#!/usr/bin/env bash
#
# Start the vLLM OpenAI-compatible API server
# (python -m vllm.entrypoints.openai.api_server) for a local
# Qwen2.5-7B-Instruct checkpoint.
#
# Usage:
#   [SERVE_GPU_IDS=...] [SERVE_MODEL_PATH=...] [SERVE_MODEL_NAME=...] \
#     [SERVE_PORT=...] <this-script> [extra api_server args...]
#
# Environment overrides (each falls back to the default shown when unset
# or empty):
#   SERVE_GPU_IDS     value exported as CUDA_VISIBLE_DEVICES   (default: 1)
#   SERVE_MODEL_PATH  value passed to --model
#                     (default: /home/LB14787_linux/jinke/models/qwen2.5_7b_instruct)
#   SERVE_MODEL_NAME  value passed to --served-model-name
#                     (default: Qwen2.5-7B-Instruct)
#   SERVE_PORT        value passed to --port                   (default: 10425)
#
# Any command-line arguments are appended verbatim to the api_server
# invocation. Only POSIX shell constructs are used, so running the file with
# `sh` keeps working.

serve_gpu_ids="${SERVE_GPU_IDS:-1}"
serve_model_path="${SERVE_MODEL_PATH:-/home/LB14787_linux/jinke/models/qwen2.5_7b_instruct}"
serve_model_name="${SERVE_MODEL_NAME:-Qwen2.5-7B-Instruct}"
serve_port="${SERVE_PORT:-10425}"

# A dedicated SERVE_GPU_IDS variable is used instead of honouring an inherited
# CUDA_VISIBLE_DEVICES so that, without overrides, the server is always pinned
# to the same device selection regardless of the caller's environment.
export CUDA_VISIBLE_DEVICES="${serve_gpu_ids}"

# exec replaces this shell with the Python process, so signals sent to the
# launcher's PID reach the server directly instead of a wrapper shell.
exec python -m vllm.entrypoints.openai.api_server \
  --served-model-name "${serve_model_name}" \
  --model "${serve_model_path}" \
  --port "${serve_port}" \
  "$@"